AOMedia AV1 Codec
firstpass.h
1/*
2 * Copyright (c) 2016, Alliance for Open Media. All rights reserved.
3 *
4 * This source code is subject to the terms of the BSD 2 Clause License and
5 * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
6 * was not distributed with this source code in the LICENSE file, you can
7 * obtain it at www.aomedia.org/license/software. If the Alliance for Open
8 * Media Patent License 1.0 was not distributed with this source code in the
9 * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
10 */
11
12#ifndef AOM_AV1_ENCODER_FIRSTPASS_H_
13#define AOM_AV1_ENCODER_FIRSTPASS_H_
14
15#include <stdbool.h>
16
17#include "av1/common/av1_common_int.h"
18#include "av1/common/enums.h"
20#include "av1/encoder/ratectrl.h"
21
22#ifdef __cplusplus
23extern "C" {
24#endif
25
// Nudges x away from zero by 0.000001: negative values move further below
// zero, all other values move above it, so the result is never exactly zero.
// NOTE: x is evaluated twice; do not pass an expression with side effects.
#define DOUBLE_DIVIDE_CHECK(x) ((x) < 0 ? (x)-0.000001 : (x) + 0.000001)

// Tuning thresholds. Their consumers are outside this header.
// NOTE(review): units and exact meaning are not visible here — confirm
// against the call sites before changing any value.
#define MIN_ZERO_MOTION 0.95
#define MAX_SR_CODED_ERROR 40
#define MAX_RAW_ERR_VAR 2000
#define MIN_MV_IN_OUT 0.4

#define VLOW_MOTION_THRESHOLD 950
// Forward declaration: only pointers to ThreadData are needed in this header.
struct ThreadData;
35
175
// We want to keep one past stats for key frame detection
// in test_candidate_kf()
#define FIRSTPASS_INFO_STATS_PAST_MIN 1

// The size of static buffer used in FIRSTPASS_INFO: room for MAX_LAP_BUFFERS
// entries plus the minimum number of past stats that must be retained.
#define FIRSTPASS_INFO_STATIC_BUF_SIZE \
  (MAX_LAP_BUFFERS + FIRSTPASS_INFO_STATS_PAST_MIN)
183
187typedef struct {
197 FIRSTPASS_STATS static_stats_buf[FIRSTPASS_INFO_STATIC_BUF_SIZE];
215
222
227
232
237
243
257 FIRSTPASS_STATS *ext_stats_buf,
258 int ext_stats_buf_size);
259
267 FIRSTPASS_INFO *firstpass_info);
268
276
284 FIRSTPASS_INFO *firstpass_info);
285
295 const FIRSTPASS_STATS *input_stats);
296
309 const FIRSTPASS_INFO *firstpass_info, int offset_from_cur);
310
324 int offset_from_cur);
325
// Threshold associated with the frame content classification below.
// NOTE(review): the quantity compared against this value is not visible in
// this header — confirm at the call site.
#define FC_ANIMATION_THRESH 0.15
// Frame content classes. FRAME_CONTENT_TYPES is the number of classes, not a
// class itself. UENUM1BYTE is a project macro that names the resulting type.
enum {
  FC_NORMAL = 0,
  FC_GRAPHICS_ANIMATION = 1,
  FRAME_CONTENT_TYPES = 2
} UENUM1BYTE(FRAME_CONTENT_TYPE);
339typedef struct GF_GROUP {
341 // Frame update type, e.g. ARF/GF/LF/Overlay
342 FRAME_UPDATE_TYPE update_type[MAX_STATIC_GF_GROUP_LENGTH];
343 unsigned char arf_src_offset[MAX_STATIC_GF_GROUP_LENGTH];
344 // The number of frames displayed so far within the GOP at a given coding
345 // frame.
346 unsigned char cur_frame_idx[MAX_STATIC_GF_GROUP_LENGTH];
347 int layer_depth[MAX_STATIC_GF_GROUP_LENGTH];
348 int arf_boost[MAX_STATIC_GF_GROUP_LENGTH];
349 int max_layer_depth;
350 int max_layer_depth_allowed;
351 // This is currently only populated for AOM_Q mode
352 int q_val[MAX_STATIC_GF_GROUP_LENGTH];
353 int rdmult_val[MAX_STATIC_GF_GROUP_LENGTH];
354 int bit_allocation[MAX_STATIC_GF_GROUP_LENGTH];
355 // The frame coding type - inter/intra frame
356 FRAME_TYPE frame_type[MAX_STATIC_GF_GROUP_LENGTH];
357 // The reference frame buffer control - update or reset
358 REFBUF_STATE refbuf_state[MAX_STATIC_GF_GROUP_LENGTH];
359 int arf_index; // the index in the gf group of ARF, if no arf, then -1
360 int size; // The total length of a GOP
361
362 // The offset into lookahead_ctx for choosing
363 // source of frame parallel encodes.
364 int src_offset[MAX_STATIC_GF_GROUP_LENGTH];
365 // Stores the display order hint of each frame in the current GF_GROUP.
366 int display_idx[MAX_STATIC_GF_GROUP_LENGTH];
367
368 // The reference frame list maps the reference frame indexes to its
369 // buffer index in the decoded buffer. A value of -1 means the
370 // corresponding reference frame index doesn't point towards any
371 // previously decoded frame.
372 int8_t ref_frame_list[MAX_STATIC_GF_GROUP_LENGTH][REF_FRAMES];
373 // Update frame index
374 int update_ref_idx[MAX_STATIC_GF_GROUP_LENGTH];
375 // The map_idx of primary reference
376 int primary_ref_idx[MAX_STATIC_GF_GROUP_LENGTH];
377
378 // Indicates the level of parallelism in frame parallel encodes.
379 // 0 : frame is independently encoded (not part of parallel encodes).
380 // 1 : frame is the first in encode order in a given parallel encode set.
381 // 2 : frame occurs later in encode order in a given parallel encode set.
382 int frame_parallel_level[MAX_STATIC_GF_GROUP_LENGTH];
383 // Indicates whether a frame should act as non-reference frame.
384 bool is_frame_non_ref[MAX_STATIC_GF_GROUP_LENGTH];
385 // Indicates whether a frame is dropped.
386 bool is_frame_dropped[MAX_STATIC_GF_GROUP_LENGTH];
387
388 // Stores the display order hint of the frames not to be
389 // refreshed by the current frame.
390 int skip_frame_refresh[MAX_STATIC_GF_GROUP_LENGTH][REF_FRAMES];
391 // Stores the display order hint of the frame to be excluded during reference
392 // assignment.
393 int skip_frame_as_ref[MAX_STATIC_GF_GROUP_LENGTH];
394 // Indicates whether a switch frame is due.
395 bool is_sframe_due;
397} GF_GROUP;
// State carried alongside golden-frame group decisions.
typedef struct {
  // Track if the last frame in a GOP has higher quality.
  int arf_gf_boost_lst;
} GF_STATE;
404
405typedef struct {
406 FIRSTPASS_STATS *stats_in_start;
407 FIRSTPASS_STATS *stats_in_end;
408 FIRSTPASS_STATS *stats_in_buf_end;
409 FIRSTPASS_STATS *total_stats;
410 FIRSTPASS_STATS *total_left_stats;
411} STATS_BUFFER_CTX;
412
418typedef struct {
420 unsigned int section_intra_rating;
421 // Circular queue of first pass stats stored for most recent frames.
422 // cpi->output_pkt_list[i].data.twopass_stats.buf points to actual data stored
423 // here.
424 FIRSTPASS_STATS *frame_stats_arr[MAX_LAP_BUFFERS + 1];
425 int frame_stats_next_idx; // Index to next unused element in frame_stats_arr.
426 STATS_BUFFER_CTX *stats_buf_ctx;
427 FIRSTPASS_INFO firstpass_info; // This is the first pass data structure
428 // intended to replace stats_in
429 int first_pass_done;
430 int64_t bits_left;
431 double modified_error_min;
432 double modified_error_max;
433 double modified_error_left;
434
435 // Projected total bits available for a key frame group of frames
436 int64_t kf_group_bits;
437
438 // Error score of frames still to be coded in kf group
439 double kf_group_error_left;
440
441 // Over time correction for bits per macro block estimation
442 double bpm_factor;
443
444 // Record of target and actual bits spent in current ARF group
445 int rolling_arf_group_target_bits;
446 int rolling_arf_group_actual_bits;
447
448 int sr_update_lag;
449
450 int kf_zeromotion_pct;
451 int last_kfgroup_zeromotion_pct;
452 int extend_minq;
453 int extend_maxq;
455} TWO_PASS;
456
460typedef struct {
462 const FIRSTPASS_STATS *stats_in;
463 // Pointer to the stats of the current frame.
464 const FIRSTPASS_STATS *this_frame;
465 double mb_av_energy;
466 // An indication of the content type of the current frame
467 FRAME_CONTENT_TYPE fr_content_type;
468 double frame_avg_haar_energy;
471
// This structure contains several key parameters to be accumulated for this
// frame.
typedef struct {
  // Intra prediction error.
  int64_t intra_error;
  // Average wavelet energy computed using Discrete Wavelet Transform (DWT).
  int64_t frame_avg_wavelet_energy;
  // Best of intra pred error and inter pred error using last frame as ref.
  int64_t coded_error;
  // Best of intra pred error and inter pred error using golden frame as ref.
  int64_t sr_coded_error;
  // Count of motion vector.
  int mv_count;
  // Count of blocks that pick inter prediction (inter pred error is smaller
  // than intra pred error).
  int inter_count;
  // Count of blocks that pick second ref (golden frame).
  int second_ref_count;
  // Count of blocks where the inter and intra are very close and very low.
  // Stored as a double, unlike the other counters, so it can hold fractions.
  double neutral_count;
  // Count of blocks where intra error is very small.
  int intra_skip_count;
  // Start row.
  int image_data_start_row;
  // Count of unique non-zero motion vectors.
  int new_mv_count;
  // Sum of inward motion vectors.
  int sum_in_vectors;
  // Sum of motion vector row.
  int sum_mvr;
  // Sum of motion vector column.
  int sum_mvc;
  // Sum of absolute value of motion vector row.
  int sum_mvr_abs;
  // Sum of absolute value of motion vector column.
  int sum_mvc_abs;
  // Sum of the square of motion vector row.
  int64_t sum_mvrs;
  // Sum of the square of motion vector column.
  int64_t sum_mvcs;
  // A factor calculated using intra pred error.
  double intra_factor;
  // A factor that measures brightness.
  double brightness_factor;
} FRAME_STATS;
519
520// This structure contains first pass data.
521typedef struct {
522 // Buffer holding frame stats for all MACROBLOCKs.
523 // mb_stats[i] stores the FRAME_STATS of the ith
524 // MB in raster scan order.
525 FRAME_STATS *mb_stats;
526 // Buffer to store the prediction error of the (0,0) motion
527 // vector using the last source frame as the reference.
528 // raw_motion_err_list[i] stores the raw_motion_err of
529 // the ith MB in raster scan order.
530 int *raw_motion_err_list;
531} FirstPassData;
532
// Forward declarations of encoder types defined elsewhere. This header only
// needs them as incomplete types, so their definitions are not included here.
struct AV1_COMP;
struct EncodeFrameParams;
struct AV1EncoderConfig;
struct TileDataEnc;
537
538static inline int is_fp_wavelet_energy_invalid(
539 const FIRSTPASS_STATS *fp_stats) {
540 assert(fp_stats != NULL);
541 return (fp_stats->frame_avg_wavelet_energy < 0);
542}
543
544static inline BLOCK_SIZE get_fp_block_size(int is_screen_content_type) {
545 return (is_screen_content_type ? BLOCK_8X8 : BLOCK_16X16);
546}
547
548int av1_get_unit_rows_in_tile(const TileInfo *tile,
549 const BLOCK_SIZE fp_block_size);
550int av1_get_unit_cols_in_tile(const TileInfo *tile,
551 const BLOCK_SIZE fp_block_size);
552
553void av1_first_pass_row(struct AV1_COMP *cpi, struct ThreadData *td,
554 struct TileDataEnc *tile_data, const int mb_row,
555 const BLOCK_SIZE fp_block_size);
556void av1_end_first_pass(struct AV1_COMP *cpi);
557
558void av1_free_firstpass_data(FirstPassData *firstpass_data);
559
560void av1_twopass_zero_stats(FIRSTPASS_STATS *section);
561void av1_accumulate_stats(FIRSTPASS_STATS *section,
562 const FIRSTPASS_STATS *frame);
/*!\brief AV1 first pass encoding.
 *
 * \param[in]    cpi            Encoder instance.
 * \param[in]    ts_duration    Duration value for the frame.
 *                              NOTE(review): units are not visible in this
 *                              header — confirm with the caller.
 */
void av1_first_pass(struct AV1_COMP *cpi, const int64_t ts_duration);

// Takes the same arguments as av1_first_pass().
// NOTE(review): presumably a variant that skips the actual first pass
// analysis for the frame — confirm against the definition.
void av1_noop_first_pass_frame(struct AV1_COMP *cpi, const int64_t ts_duration);
586#ifdef __cplusplus
587} // extern "C"
588#endif
589
590#endif // AOM_AV1_ENCODER_FIRSTPASS_H_
aom_codec_err_t
Algorithm return codes.
Definition aom_codec.h:155
aom_codec_err_t av1_firstpass_info_push(FIRSTPASS_INFO *firstpass_info, const FIRSTPASS_STATS *input_stats)
Push a stats into firstpass_info.
const FIRSTPASS_STATS * av1_firstpass_info_peek(const FIRSTPASS_INFO *firstpass_info, int offset_from_cur)
Peek at a stats from firstpass_info.
aom_codec_err_t av1_firstpass_info_move_cur_index(FIRSTPASS_INFO *firstpass_info)
Move cur_index by 1.
void av1_first_pass(struct AV1_COMP *cpi, const int64_t ts_duration)
AV1 first pass encoding.
aom_codec_err_t av1_firstpass_info_pop(FIRSTPASS_INFO *firstpass_info)
Pop a stats from firstpass_info.
aom_codec_err_t av1_firstpass_info_init(FIRSTPASS_INFO *firstpass_info, FIRSTPASS_STATS *ext_stats_buf, int ext_stats_buf_size)
Init firstpass_info.
aom_codec_err_t av1_firstpass_info_move_cur_index_and_pop(FIRSTPASS_INFO *firstpass_info)
Move cur_index by 1 and pop a stats from firstpass_info.
int av1_firstpass_info_future_count(const FIRSTPASS_INFO *firstpass_info, int offset_from_cur)
Count the future stats from the target in firstpass_info. Note that the target stats will be counted a...
Describes look ahead buffer operations.
Main encoder configuration data structure.
Definition encoder.h:933
Top level encoder structure.
Definition encoder.h:2885
contains per-frame encoding parameters decided upon by av1_encode_strategy() and passed down to av1_e...
Definition encoder.h:3706
Data structure used for managing first pass stats.
Definition firstpass.h:187
int cur_index
Definition firstpass.h:226
int past_stats_count
Definition firstpass.h:236
int future_stats_count
Definition firstpass.h:231
int stats_buf_size
Definition firstpass.h:206
FIRSTPASS_STATS total_stats
Definition firstpass.h:241
int start_index
Definition firstpass.h:214
int stats_count
Definition firstpass.h:221
FIRSTPASS_STATS * stats_buf
Definition firstpass.h:202
The structure of accumulated frame stats in the first pass.
Definition firstpass.h:43
double pcnt_neutral
Definition firstpass.h:90
double MVr
Definition firstpass.h:110
double MVc
Definition firstpass.h:118
double log_intra_error
Definition firstpass.h:169
double pcnt_second_ref
Definition firstpass.h:84
double mvr_abs
Definition firstpass.h:114
double pcnt_inter
Definition firstpass.h:74
double intra_error
Definition firstpass.h:58
double new_mv_count
Definition firstpass.h:140
double count
Definition firstpass.h:149
double coded_error
Definition firstpass.h:66
double raw_error_stdev
Definition firstpass.h:153
double pcnt_motion
Definition firstpass.h:78
double frame
Definition firstpass.h:48
double cor_coeff
Definition firstpass.h:165
double mv_in_out_count
Definition firstpass.h:136
double noise_var
Definition firstpass.h:161
double MVcv
Definition firstpass.h:130
double log_coded_error
Definition firstpass.h:173
int64_t is_flash
Definition firstpass.h:157
double inactive_zone_cols
Definition firstpass.h:106
double frame_avg_wavelet_energy
Definition firstpass.h:62
double duration
Definition firstpass.h:144
double sr_coded_error
Definition firstpass.h:70
double mvc_abs
Definition firstpass.h:122
double intra_skip_pct
Definition firstpass.h:98
double MVrv
Definition firstpass.h:126
double inactive_zone_rows
Definition firstpass.h:102
double weight
Definition firstpass.h:54
Data related to the current GF/ARF group and the individual frames within the group.
Definition firstpass.h:339
Frame level Two pass status and control data.
Definition firstpass.h:460
Two pass status and control data.
Definition firstpass.h:418